


from multiprocessing.reduction import duplicate

import pandas as  pd

# Clean the raw job-posting spreadsheet and inspect the salary distribution.
# Steps: load -> drop unused columns -> report missing values -> drop duplicate
# rows -> print a structural summary -> draw a boxplot of the salary column.

# Load the raw data; the path is resolved relative to the working directory.
df = pd.read_excel('./data/computer_2_old_2.xlsx')

# Remove the two salary-bound columns; they are not used further below.
df = df.drop(columns=['min_salary', 'max_salary'])

# Per-column count of missing values.
print(df.isna().sum())

# Show the rows that exactly repeat an earlier row, then remove them and
# renumber the index so it is contiguous again.
duplicates = df.duplicated()
print(df[duplicates])
df = df.drop_duplicates().reset_index(drop=True)

# DataFrame.info() writes its summary to stdout itself and returns None, so it
# must not be wrapped in print() (that would emit an extra "None" line).
df.info()

from matplotlib import pyplot as plt

# Use a font that can render the Chinese characters in the column label.
plt.rcParams['font.sans-serif'] = ['SimHei']
# CJK fonts such as SimHei commonly lack the Unicode minus glyph; fall back to
# the ASCII hyphen so negative tick labels do not render as empty boxes.
plt.rcParams['axes.unicode_minus'] = False

df.boxplot(column='salary(岳千皓)')
plt.show()

# Export of the cleaned frame is currently disabled:
# df.to_excel('computer_2_new.xlsx',sheet_name='sheet1')